#!/usr/bin/env bash
#
# Launches main.py for one node's shard of a dataset: reads that node's
# wav.scp and text files and writes the results under the matching output
# directory.
#
# The variables below are defaults. They are declared BEFORE parse_options.sh
# is sourced; presumably that script lets them be overridden from the command
# line (e.g. `--node node3`) -- confirm against parse_options.sh.

# Root directory holding the per-dataset wav.scp / text inputs.
gxl_scp_root_dir="/home/work_nfs8/xlgeng/aslp_spider_data"
# Root directory under which the output for each dataset/node is written.
gxl_k2_root_dir="/home/work_nfs10/data/aslp_spider_data_k2_fbank"
# First- and second-level dataset directory names.
big_name='pici_45093H'
second_name='tiqianpi_1_3500H'
# Values forwarded verbatim to main.py (see the invocation at the bottom).
split_num=500
num_thread_for_manifest=8
num_thread_for_fbank=8
# Sub-directory of the dataset handled by this run.
node='node2'

. /home/work_nfs8/xlgeng/new_workspace/wenet_gxl_salmonn/examples/aishell/salmonn/tools/parse_options.sh || exit 1;

# Paths are derived only after the options script has run, so any value it
# changed is reflected here.
wav_scp_path="$gxl_scp_root_dir/$big_name/$second_name/$node/wav.scp"
text_scp_path="$gxl_scp_root_dir/$big_name/$second_name/$node/text"
output_dir="$gxl_k2_root_dir/$big_name/$second_name/$node"
partition="train"
prefix="aslp-spider-data"

#python do_split_and_concat.py
# Every expansion is quoted so that a path or value containing whitespace or
# glob characters reaches main.py as exactly one argument.
python main.py \
  --wav_scp_path "$wav_scp_path" \
  --text_scp_path "$text_scp_path" \
  --output_dir "$output_dir" \
  --split_num "$split_num" \
  --num_thread_for_manifest "$num_thread_for_manifest" \
  --partition "$partition" \
  --prefix "$prefix" \
  --num_thread_for_fbank "$num_thread_for_fbank"
